home *** CD-ROM | disk | FTP | other *** search
/ Mac Magazin/MacEasy 76 / maccd 76.iso / macware / Cyclone 1.3 / Scripting / Encoding Dictionary < prev   
Encoding:
Text File  |  2000-09-24  |  18.5 KB  |  209 lines  |  [TEXT/ToyS]

  1. (*
  2.  
  3. A list of encoding names registered in Cyclone for AppleScript.
  4. This list is based on Apple's <TextCommon.h> and "Programming With the Text Encoding Conversion Manager"
  5. (For Version 1.5).
  6. If you have any problems with these names, or you need an encoding that is not listed here,
  7. you may use raw numbers in your scripts as well (in decimal form; AppleScript does not support hex).
  8. Some of these encodings are not supported by the current version of the Text Encoding Converter.
  9. Encodings marked with '*' are available with TEC 1.4.2/1.4.3.
  10. Encodings marked with '•' are new in TEC 1.5.
  11.  
  12. Note that spaces and punctuation characters are replaced with '_' in names for AppleScript compatibility.
  13.  
  14. Cyclone 1.3 adds Internet name support via TECGetTextEncodingFromInternetName() call,
  15. inheriting all its features and limitations. Internet names are case-insensitive.
  16. Contrary to what the TEC documentation says, the Internet name "UTF-16" is not supported by TEC 1.5,
  17. but Cyclone 1.3 checks for "UTF-16" and resolves it properly.
  18. I did not test these names extensively. If you find an Internet name which is not listed here,
  19. but works with TEC, drop me a line <mailto:tkukiel@mac.com>.
  20.  
  21.  
  22. Name:                                  Code:       Internet name:                           Comments:
  23.  
  24. "Mac_Western"                          0x00000000  "mac", "macintosh", "x-mac-roman"     "same as Roman"*
  25. "Mac_Roman"                            0x00000000  "mac", "macintosh", "x-mac-roman"     "Western"*
  26.  "Mac_Roman_Euro_Sign"                 0x00000000  "mac", "macintosh", "x-mac-roman"     ""*
  27.  "Mac_Roman_Old"                       0x00010000     -                                  ""*
  28. "Mac_Japanese"                         0x00000001  "x-mac-japanese"                      ""*
  29.  "Mac_Japanese_Standard"               0x00000001  "x-mac-japanese"                      ""*
  30.  "Mac_Japanese_Standard_No_Verticals"  0x00010001     -                                  ""*
  31.  "Mac_Japanese_Basic"                  0x00020001     -                                  ""*
  32.  "Mac_Japanese_PostScript_Screen"      0x00030001     -                                  ""*
  33.  "Mac_Japanese_PostScript_Print"       0x00040001     -                                  ""*
  34.  "Mac_Japanese_Vert_At_Ku_Plus_Ten"    0x00050001     -                                  ""*
  35. "Mac_Traditional_Chinese"              0x00000002  "x-mac-chinesetrad"                   ""*
  36. "Mac_Korean"                           0x00000003  "x-mac-korean"                        ""*
  37. "Mac_Arabic"                           0x00000004  "x-mac-arabic"                        ""*
  38.  "Mac_Arabic_Standard"                 0x00000004  "x-mac-arabic"                        ""*
  39.  "Mac_Arabic_TrueType"                 0x00010004     -                                  ""*
  40.  "Mac_Arabic_Thuluth"                  0x00020004     -                                  ""*
  41.  "Mac_Arabic_AlBayan"                  0x00030004     -                                  ""*
  42. "Mac_Hebrew"                           0x00000005  "x-mac-hebrew"                        ""*
  43.  "Mac_Hebrew_Standard"                 0x00000005  "x-mac-hebrew"                        ""*
  44.  "Mac_Hebrew_Figure_Space"             0x00010005     -                                  ""*
  45. "Mac_Greek"                            0x00000006  "x-mac-greek"                         ""*
  46. "Mac_Cyrillic"                         0x00000007  "x-mac-cyrillic"                      ""*
  47.  "Mac_Cyrillic_Old_Standard"           0x00010007     -                                  ""•
  48.  "Mac_Cyrillic_Old_Ukrainian"          0x00020007     -                                  ""•
  49.  "Mac_Cyrillic_Euro_Sign"              0x00030007     -                                  ""•
  50. "Mac_Devanagari"                       0x00000009  "x-mac-devanagari"                    ""*
  51. "Mac_Gurmukhi"                         0x0000000A  "x-mac-gurmukhi"                      ""*
  52. "Mac_Gujarati"                         0x0000000B  "x-mac-gujarati"                      ""*
  53. "Mac_Oriya"                            0x0000000C     -                                  ""
  54. "Mac_Bengali"                          0x0000000D     -                                  ""
  55. "Mac_Tamil"                            0x0000000E     -                                  ""
  56. "Mac_Telugu"                           0x0000000F     -                                  ""
  57. "Mac_Kannada"                          0x00000010     -                                  ""
  58. "Mac_Malayalam"                        0x00000011     -                                  ""
  59. "Mac_Sinhalese"                        0x00000012     -                                  ""
  60. "Mac_Burmese"                          0x00000013     -                                  ""
  61. "Mac_Khmer"                            0x00000014     -                                  ""
  62. "Mac_Thai"                             0x00000015  "x-mac-thai"                          ""*
  63. "Mac_Laotian"                          0x00000016     -                                  ""
  64. "Mac_Georgian"                         0x00000017     -                                  ""
  65. "Mac_Armenian"                         0x00000018     -                                  ""
  66. "Mac_Simplified_Chinese"               0x00000019  "x-mac-chinesesimp"                   ""*
  67. "Mac_Tibetan"                          0x0000001A  "x-mac-tibetan"                       ""•
  68. "Mac_Mongolian"                        0x0000001B     -                                  ""
  69. "Mac_Ethiopic"                         0x0000001C     -                                  ""
  70. "Mac_Central_European"                 0x0000001D  "x-mac-centraleurroman"               ""*
  71. "Mac_Vietnamese"                       0x0000001E     -                                  ""
  72. "Mac_Arabic_Extended"                  0x0000001F     -                                  ""
  73. "Mac_Symbol"                           0x00000021  "x-mac-symbol"                        ""*
  74. "Mac_Dingbats"                         0x00000022  "x-mac-dingbats"                      ""*
  75. "Mac_Turkish"                          0x00000023  "x-mac-turkish"                       ""*
  76. "Mac_Croatian"                         0x00000024  "x-mac-croatian"                      ""*
  77.  "Mac_Croatian_Euro_Sign"              0x00000024  "x-mac-croatian"                      ""*
  78.  "Mac_Croatian_Old"                    0x00010024     -                                  ""*
  79. "Mac_Icelandic"                        0x00000025  "x-mac-icelandic"                     ""*
  80.  "Mac_Icelandic_Euro_Sign_Standard"    0x00000025  "x-mac-icelandic"                     ""*
  81.  "Mac_Icelandic_Old_Standard"          0x00020025     -                                  ""*
  82.  "Mac_Icelandic_Old_TrueType"          0x00030025     -                                  ""*
  83.  "Mac_Icelandic_Euro_Sign_TrueType"    0x00050025     -                                  ""*
  84. "Mac_Romanian"                         0x00000026  "x-mac-romanian"                      ""*
  85.  "Mac_Romanian_Euro_Sign"              0x00000026  "x-mac-romanian"                      ""*
  86.  "Mac_Romanian_Old"                    0x00010026     -                                  ""*
  87. "Mac_Celtic"                           0x00000027     -                                  ""
  88. "Mac_Gaelic"                           0x00000028     -                                  ""
  89. "Mac_Farsi"                            0x0000008C  "x-mac-farsi"                         ""*
  90.  "Mac_Farsi_Standard"                  0x0000008C  "x-mac-farsi"                         ""*
  91.  "Mac_Farsi_TrueType"                  0x0001008C     -                                  ""*
  92. "Mac_Ukrainian"                        0x00000098  "x-mac-ukrainian"                     "in TEC 1.5 mapped to Mac_Cyrillic"*
  93. "Mac_Inuit"                            0x000000EC     -                                  ""
  94. "Mac_VT100"                            0x000000FC  "x-mac-vt100"                         ""*
  95.  "Mac_VT100_Euro_Sign"                 0x000000FC  "x-mac-vt100"                         ""*
  96.  "Mac_VT100_Old"                       0x000100FC     -                                  ""*
  97.  
  98. "Unicode_1_1"                          0x00000101  "UNICODE-1-1"                         "default Standard 16 Bit"*
  99.  "Unicode_1_1_16_Bit"                  0x00000101  "UNICODE-1-1"                         "same as Standard"*
  100.  "Unicode_1_1_Standard"                0x00000101  "UNICODE-1-1"                         "16 Bit"*
  101.  "Unicode_1_1_No_Compatibility"        0x00010101     -                                  ""
  102.  "Unicode_1_1_Canonical_Decomposition" 0x00020101     -                                  ""
  103.  "Unicode_1_1_No_Composed"             0x00030101     -                                  ""
  104.  "Unicode_1_1_No_Corporate"            0x00040101     -                                  ""
  105.  
  106.  "Unicode_1_1_UTF_7"                   0x04000101  "UNICODE-1-1-UTF-7"                   "7 Bit"*
  107.  "Unicode_1_1_UTF_8"                   0x08000101  "UNICODE-1-1-UTF-8"                   "8 Bit"*
  108.  
  109. "Unicode"                              0x00000103  "UNICODE-2-0"                         "default to Unicode 2.1 16 Bit"*
  110. "Unicode_2_0"                          0x00000103  "UNICODE-2-0"                         "New location for Korean Hangul"*
  111. "Unicode_2_1"                          0x00000103  "UNICODE-2-0", "UTF-16"               "We treat both Unicode 2.0 and Unicode 2.1 as 2.1"*
  112.  "Unicode_2_1_16_Bit"                  0x00000103  "UNICODE-2-0", "UTF-16"               "same as Standard"*
  113.  "Unicode_2_1_Standard"                0x00000103  "UNICODE-2-0", "UTF-16"               "16 Bit"*
  114.  "Unicode_2_1_No_Compatibility"        0x00010103     -                                  ""
  115.  "Unicode_2_1_Canonical_Decomposition" 0x00020103     -                                  ""•
  116.  "Unicode_2_1_No_Composed"             0x00030103     -                                  ""
  117.  "Unicode_2_1_No_Corporate"            0x00040103     -                                  ""
  118.  
  119.  "Unicode_2_1_UTF_7"                   0x04000103  "UNICODE-2-0-UTF-7", "UTF-7"          "7 Bit"*
  120.  "Unicode_2_1_UTF_8"                   0x08000103  "UNICODE-2-0-UTF-8", "UTF-8"          "8 Bit"*
  121.  
  122. "ISO_Latin_1"                          0x00000201  "ISO-8859-1", "latin1"                "ISO 8859-1"*
  123. "ISO_Latin_2"                          0x00000202  "ISO-8859-2", "latin2"                "ISO 8859-2"*
  124. "ISO_Latin_3"                          0x00000203  "ISO-8859-3", "latin3"                "ISO 8859-3"•
  125. "ISO_Latin_4"                          0x00000204  "ISO-8859-4", "latin4"                "ISO 8859-4"•
  126. "ISO_Latin_Cyrillic"                   0x00000205  "ISO-8859-5", "cyrillic"              "ISO 8859-5"*
  127. "ISO_Latin_Arabic"                     0x00000206  "ISO-8859-6", "arabic"                "ISO 8859-6, = ASMO 708, =DOS CP 708"*
  128. "ISO_Latin_Greek"                      0x00000207  "ISO-8859-7", "greek"                 "ISO 8859-7"*
  129. "ISO_Latin_Hebrew"                     0x00000208  "ISO-8859-8", "hebrew"                "ISO 8859-8"*
  130. "ISO_Latin_5"                          0x00000209  "ISO-8859-9", "latin5"                "ISO 8859-9, Turkish"*
  131. "ISO_Latin_6"                          0x0000020A     -                                  "ISO 8859-10"
  132. "ISO_Latin_7"                          0x0000020D     -                                  "ISO 8859-13, Baltic Rim"
  133. "ISO_Latin_8"                          0x0000020E     -                                  "ISO 8859-14, Celtic"
  134. "ISO_Latin_9"                          0x0000020F  "ISO-8859-15", "latin9"               "ISO 8859-15, 8859-1 changed for EURO & CP1252 letters"•
  135.  
  136. "DOS_Latin_US"                         0x00000400  "cp437"                               "CP 437"*
  137. "DOS_Greek"                            0x00000405     -                                  "CP 737 (formerly CP 437G)"
  138. "DOS_Baltic_Rim"                       0x00000406     -                                  "CP 775"
  139. "DOS_Latin_1"                          0x00000410  "cp850"                               "CP 850  <Multilingual>"*
  140. "DOS_Greek_1"                          0x00000411     -                                  "CP 851"
  141. "DOS_Latin_2"                          0x00000412     -                                  "CP 852, Slavic"
  142. "DOS_Cyrillic"                         0x00000413     -                                  "CP 855, IBM Cyrillic"
  143. "DOS_Turkish"                          0x00000414     -                                  "CP 857, IBM Turkish"
  144. "DOS_Portuguese"                       0x00000415     -                                  "CP 860"
  145. "DOS_Icelandic"                        0x00000416     -                                  "CP 861"
  146. "DOS_Hebrew"                           0x00000417     -                                  "CP 862"
  147. "DOS_Canadian_French"                  0x00000418     -                                  "CP 863"
  148. "DOS_Arabic"                           0x00000419  "cp864"                               "CP 864"*
  149. "DOS_Nordic"                           0x0000041A     -                                  "CP 865"
  150. "DOS_Russian"                          0x0000041B  "cp866"                               "CP 866"
  151. "DOS_Greek_2"                          0x0000041C     -                                  "CP 869, IBM Modern Greek"
  152. "DOS_Thai"                             0x0000041D  "cp874"                               "CP 874, also for Windows"*
  153. "DOS_Japanese"                         0x00000420     -                                  "CP 932, also for Windows; Shift-JIS with additions"*
  154. "DOS_Simplified_Chinese"               0x00000421     -                                  "CP 936, also for Windows; was EUC-CN, now GBK (EUC-CN extended)"*
  155. "DOS_Korean"                           0x00000422     -                                  "CP 949, also for Windows; Unified Hangul Code (EUC-KR extended)"
  156. "DOS_Traditional_Chinese"              0x00000423     -                                  "CP 950, also for Windows; Big-5"*
  157. "Win_Latin_1"                          0x00000500  "windows-1252", "cp1252"              "CP 1252"*
  158. "Win_ANSI"                             0x00000500  "windows-1252", "cp1252"              "CP 1252 (alternate name)"*
  159. "Win_Latin_2"                          0x00000501  "windows-1250", "cp1250"              "CP 1250, Central Europe"*
  160. "Win_Cyrillic"                         0x00000502  "windows-1251", "cp1251"              "CP 1251, Slavic Cyrillic"*
  161. "Win_Greek"                            0x00000503  "windows-1253", "cp1253"              "CP 1253"*
  162. "Win_Latin_5"                          0x00000504  "windows-1254", "cp1254"              "CP 1254, Turkish"*
  163. "Win_Hebrew"                           0x00000505  "windows-1255", "cp1255"              "CP 1255"*
  164. "Win_Arabic"                           0x00000506  "windows-1256", "cp1256"              "CP 1256"*
  165. "Win_Baltic_Rim"                       0x00000507  "windows-1257", "cp1257"              "CP 1257"•
  166. "Win_Vietnamese"                       0x00000508  "windows-1258", "cp1258"              "CP 1258"•
  167. "Win_Korean_Johab"                     0x00000510     -                                  "CP 1361, for Windows NT"
  168.  
  169. "Western_ASCII"                        0x00000600  "US-ASCII"                            ""*
  170. "Japanese_JIS_X0201_76"                0x00000620     -                                  "JIS Roman and 1-byte katakana (halfwidth)"
  171. "Japanese_JIS_X0208_83"                0x00000621     -                                  ""
  172. "Japanese_JIS_X0208_90"                0x00000622  "JIS_C6226-1983"                      ""*
  173. "Japanese_JIS_X0212_90"                0x00000623     -                                  ""
  174. "Japanese_JIS_C6226_78"                0x00000624     -                                  ""
  175. "Simplified_Chinese_GB_2312_80"        0x00000630  "csISO58GB231280"                     ""*
  176. "Chinese_GBK_95"                       0x00000631  "X-GBK"                               "annex to GB 13000-93; for Windows 95; EUC-CN extended"*
  177. "Korean_KSC_5601_87"                   0x00000640  "csKSC56011987"                       "same as KSC 5601-92 without Johab annex"*
  178. "Korean_KSC_5601_92_Johab"             0x00000641     -                                  "KSC 5601-92 Johab annex"
  179. "CNS_11643_92_P1"                      0x00000651  "x-cns11643-1"                        "CNS 11643-1992 plane 1"
  180. "CNS_11643_92_P2"                      0x00000652  "x-cns11643-2"                        "CNS 11643-1992 plane 2"
  181. "CNS_11643_92_P3"                      0x00000653     -                                  "CNS 11643-1992 plane 3 (was plane 14 in 1986 version)"
  182.  
  183. "Japanese_ISO_2022_JP"                 0x00000820  "ISO-2022-JP"                         ""*
  184. "Japanese_ISO_2022_JP_2"               0x00000821     -                                  ""
  185. "Simplified_Chinese_ISO_2022_CN"       0x00000830  "ISO-2022-CN"                         ""*
  186. "Simplified_Chinese_ISO_2022_CN_EXT"   0x00000831     -                                  ""
  187. "Korean_ISO_2022_KR"                   0x00000840  "ISO-2022-KR"                         "EUC collections begin at 0x900"*
  188. "Japanese_EUC"                         0x00000920  "EUC-JP", "X-EUC-JP"                  "ISO 646, 1-byte katakana, JIS 208, JIS 212"*
  189. "Simplified_Chinese_EUC"               0x00000930  "GB2312", "X-EUC-CN"                  "ISO 646, GB 2312-80"*
  190. "Traditional_Chinese_EUC"              0x00000931  "X-EUC-TW"                            "ISO 646, CNS 11643-1992 Planes 1-16"*
  191. "Korean_EUC"                           0x00000940  "EUC-KR"                              "ISO 646, KS C 5601-1987"*
  192.  
  193. "Japanese_Shift_JIS"                   0x00000A01  "Shift_JIS", "x-sjis", "x-shift-jis"  "plain Shift-JIS"*
  194. "Cyrillic_KOI8_R"                      0x00000A02  "KOI8-R"                              "Russian internet standard"*
  195.  
  196. "Traditional_Chinese_Big_5"            0x00000A03  "Big5"                                ""*
  197.  "Traditional_Chinese_Big_5_Basic"     0x00000A03  "Big5"                                ""*
  198.  "Traditional_Chinese_Big_5_Standard"  0x00010A03     -                                  ""
  199.  "Traditional_Chinese_Big_5_ETen"      0x00020A03     -                                  ""
  200.  
  201. "Western_Mac_Mail"                     0x00000A04  "x-mac-latin1"                        "Mac OS Roman permuted to align with ISO Latin-1"*
  202. "Simplified_Chinese_HZ_GB_2312"        0x00000A05  "HZ-GB-2312"                          "HZ (RFC 1842, for Chinese mail & news)"*
  203. "Western_Next_Step"                    0x00000B01  "X-NEXTSTEP"                          "NextStep encoding"*
  204. "Western_EBCDIC_US"                    0x00000C01     -                                  "basic EBCDIC-US"
  205. "Western_EBCDIC_CP037"                 0x00000C02  "cp037"                               "CP 037, extended EBCDIC (Latin-1 set) for US, Canada..."*
  206. "Multi_Run"                            0x00000FFF     -                                  "Multi-encoding text with external run info"*
  207.  
  208. *)
  209.